package com.gapp.gvoa.parser;
import org.jsoup.Jsoup;
import org.jsoup.nodes.Document;
import org.jsoup.nodes.Element;
import android.util.Log;
import com.gapp.gvoa.datatype.RssItem;
import com.gapp.gvoa.util.NetworkUtil;
/**
 * Downloads the HTML page an {@link RssItem} links to and copies the
 * interesting parts of that page (mp3 link and article body) into the item.
 */
public class ItemHtmlParser {
    /** Tag used for every log line written by this class. */
    public static final String tag = "ItemHtmlParser";

    /**
     * Fetches the page at {@code item.getLink()}, parses it and updates the item:
     * <ul>
     *   <li>the {@code href} of the first {@code a[id=mp3]} element, if any, is stored
     *       as the item's mp3 url;</li>
     *   <li>the inner HTML of the element with id {@code content}, with its first
     *       {@code div.contentImage} child removed, is stored as the item's full text;</li>
     *   <li>the status is set to {@link RssItem#E_PARSE_TXT_OK}.</li>
     * </ul>
     * A missing mp3 link is only logged. A missing response or a missing
     * {@code content} element is treated as a failure: the status is left untouched
     * and an exception is thrown.
     *
     * Example page this was written against:
     * http://www.51voa.com/VOA_Standard_English/us-weighs-boosting-training-for-syrian-rebels-52551.html
     *
     * @param item the item to complete; its link is read and its mp3 url, full text
     *             and status are written
     * @throws IllegalStateException if no page content was returned or the page has
     *                               no element with id {@code content}
     * @throws Exception whatever {@code NetworkUtil.httpGetContent} throws
     */
    public static void parseItemDetail(RssItem item) throws Exception
    {
        String link = item.getLink();
        String respContent = NetworkUtil.httpGetContent(link);
        if (respContent == null)
        {
            // Fail with a message that names the page instead of letting the
            // parser reject the null input with a generic error.
            throw new IllegalStateException("no content received for " + link);
        }

        Document doc = Jsoup.parse(respContent);

        Element mp3link = doc.select("a[id=mp3]").first();
        if (mp3link != null)
        {
            String mp3url = mp3link.attr("href");
            Log.i(tag, mp3url);
            item.setMp3url(mp3url);
        }
        else
        {
            Log.i(tag, "can't get mp3");
        }

        Element content = doc.getElementById("content");
        if (content == null)
        {
            // getElementById returns null when the id is absent; previously this
            // surfaced as a bare NullPointerException on the next statement.
            throw new IllegalStateException("no element with id 'content' in " + link);
        }

        // The image block is dropped so that only the article markup is stored.
        Element imageEl = content.select("div.contentImage").first();
        if (imageEl != null)
        {
            Log.i(tag, "remove image element from content");
            imageEl.remove();
        }

        String contentStr = content.html();
        Log.i(tag, contentStr);
        item.setFullText(contentStr);

        // The lyric link is currently only logged; it is not stored on the item.
        Element lrclink = content.select("a[id=lrc]").first();
        if (lrclink != null)
        {
            Log.i(tag, lrclink.attr("href"));
        }

        item.setStatus(RssItem.E_PARSE_TXT_OK);
    }
}